#!/bin/bash
#
# Launch a map-only Hadoop Streaming job: run MAPPER over INPUT and write the
# result to OUTPUT.
#
# WARNING: OUTPUT is deleted recursively before the job starts.
#
# The exit status of this script is the exit status of the `hadoop jar`
# command (the last command executed).

# Abort on any reference to an unset variable (catches typos in names below).
set -u

# Directory holding the Hadoop Streaming jar.
STREAM=/home/hadoop/hadoop/hadoop_install/contrib/streaming
#==============================================
# Program run as the streaming mapper; also shipped to the job with -file.
MAPPER=/home/hadoop/progs/python/step2_tweets_md5/mapper.py
# NOTE: IDENTITY_MAPPER and REDUCER are not referenced by the job below.
IDENTITY_MAPPER=org.apache.hadoop.mapred.lib.IdentityMapper
REDUCER=/home/hadoop/progs/python/random_reducer.py
# Extra file shipped alongside the mapper with -file.
FILE=/home/hadoop/progs/python/mylib.py
#==============================================
INPUT=/home/lih307/projects/rt/step_1_tweets_1_unique
OUTPUT=/home/lih307/projects/rt/step_2_tweets_2_md5
#==============================================
# NOTE: REDUCE_NUM is not passed to the job; the reduce phase is disabled by
# `-reducer NONE` below.
REDUCE_NUM=0
#=============================================
# Remove the previous output directory. A failure here (e.g. the directory
# does not exist yet) is deliberately not fatal; the job is submitted anyway.
# "${OUTPUT:?}" aborts the script instead of issuing a recursive delete with
# an empty path.
hadoop fs -rmr "${OUTPUT:?}"

# Submit the streaming job. All expansions are quoted so that a path
# containing whitespace or glob characters is passed as a single argument.
hadoop jar "${STREAM}/hadoop-streaming-1.0.3.jar" \
    -input "${INPUT}" \
    -output "${OUTPUT}" \
    -mapper "${MAPPER}" \
    -reducer NONE \
    -file "${MAPPER}" \
    -file "${FILE}"